model.embed_tokens.weight_quantizer TensorQuantizer(disabled) model.embed_tokens.input_quantizer HardDisabledTensorQuantizer(disabled) model.embed_tokens.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.0.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.0.mlp.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.mlp.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.mlp.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.mlp.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.mlp.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.mlp.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.0.mlp.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.0.mlp.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.0.mlp.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.1.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.1.mlp.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.mlp.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.mlp.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.mlp.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.mlp.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.mlp.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.1.mlp.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.1.mlp.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.1.mlp.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.2.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.2.mlp.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.mlp.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.mlp.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.mlp.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.mlp.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.mlp.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.2.mlp.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.2.mlp.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.2.mlp.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.3.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.3.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.31e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e+00 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e+00 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.01e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.11e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.15e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.87e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.91e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.15e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.3.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.3.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.3.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.4.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.4.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e+00 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.4.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.4.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.4.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.5.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.5.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.50e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e+00 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.68e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.45e-01 calibrator=MaxCalibrator quant) model.layers.5.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.5.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.6.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.6.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e+00 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.82e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.69e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e+00 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.6.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.6.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.7.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.7.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e+00 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.84e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.48e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.66e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e+00 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e+00 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.88e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.98e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.79e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.21e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.7.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.7.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.8.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.8.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.88e+00 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.96e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.17e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.88e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.76e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e+02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.36e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.25e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.8.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.8.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.8.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.9.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.9.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.06e+00 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.28e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.30e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.41e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.19e+00 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.9.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.9.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.9.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.10.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.10.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.31e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e+00 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.86e+00 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.10.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.10.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.10.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.11.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.11.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e+00 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e+00 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.11.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.11.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.12.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.12.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e+00 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.86e+00 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.55e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.12.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.12.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.13.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.13.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e+00 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.72e+00 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.13.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.13.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.14.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.14.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e+00 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.94e+00 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.14.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.14.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.15.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.15.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e+00 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.98e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.77e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.98e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.83e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.88e+00 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.94e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.15.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.15.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.16.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.16.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e+00 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.51e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.16.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.16.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.17.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.17.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.69e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.91e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.62e+00 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.17.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.17.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.17.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.18.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.18.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e+00 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.38e+00 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.18.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.18.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.19.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.19.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.73e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.14e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.61e+00 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.19.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.19.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.19.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.20.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.20.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.80e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.90e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.18e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.82e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.63e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.16e+00 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.20.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.20.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.20.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.21.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.21.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.22e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.56e+00 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.21.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.21.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.22.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.22.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.79e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.53e+00 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.22.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.22.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.22.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.23.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.23.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.67e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.34e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.84e+00 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.23.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.23.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.23.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.24.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.24.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e+01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.24.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.24.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.25.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.25.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.73e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.34e+00 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.20e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.16e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.25.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.25.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.26.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.26.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.91e+00 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.26.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.26.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.27.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.27.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e+00 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.06e+00 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.27.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.27.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.27.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.28.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.28.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e+00 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.50e+00 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.28.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.28.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.28.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.29.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.29.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e+00 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.32e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.85e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e+01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.63e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.63e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.48e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.29.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.29.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.30.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.30.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e+00 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.33e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.15e+01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.06e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.20e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.30.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.30.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.31.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.31.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e+00 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.50e+00 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.23e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.31.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.31.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.32.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.32.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e+00 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.70e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e+01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.06e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.32.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.32.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.33.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.33.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e+00 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.83e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e+02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.63e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.33.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.33.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.34.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.34.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e+00 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.48e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.59e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.91e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.91e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e+01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.34.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.34.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.34.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.35.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.35.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e+00 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.65e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.88e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.23e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e+01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.35.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.35.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.35.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.36.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.36.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e+00 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.79e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.55e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.59e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.48e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.20e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e+01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.36.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.36.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.36.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.37.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.37.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e+00 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.86e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.65e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.79e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.86e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e+01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.75e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.37.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.37.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.38.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.38.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e+00 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.98e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.61e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e+01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.77e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.38.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.38.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.39.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.39.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e+00 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.69e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.51e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.41e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.87e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.26e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.48e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.61e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e+01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.39.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.39.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.39.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.40.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.40.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e+00 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.27e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.59e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.21e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e+01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.40.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.40.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.41.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.41.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e+00 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.94e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.53e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.43e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.16e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e+01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.98e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.41.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.41.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.41.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.42.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.42.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e+00 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.30e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.73e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e+01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.42.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.42.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.42.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.43.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.43.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e+00 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.43e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.96e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.69e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.10e+01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.11e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.43.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.43.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.43.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.44.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.44.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e+00 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.55e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.53e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.91e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.34e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e+01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.16e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.44.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.44.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.45.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.45.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.55e+00 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.30e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.86e+01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.49e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.45.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.45.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.46.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.46.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e+00 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.61e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.25e+01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.46.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.46.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.46.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.47.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.47.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e+00 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.48e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.96e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.10e+01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.20e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.47.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.47.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.48.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.48.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.67e+00 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.84e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.80e+01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.47e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.48.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.48.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.49.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.49.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e+00 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.60e+01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.29e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.61e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.82e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.49.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.49.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.50.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.50.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e+00 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.30e+01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.50.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.50.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.51.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.51.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.80e+00 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e+01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.85e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.87e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.51.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.51.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.51.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.52.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.52.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e+00 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.98e+01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.52.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.52.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.53.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.53.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e+00 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.69e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e+01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.53.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.53.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.53.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.54.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.54.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.86e+00 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e+01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.54.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.54.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.54.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.55.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.55.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.06e+00 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.88e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.60e+01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.55.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.55.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.56.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.56.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.25e+00 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.12e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.31e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.68e+01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.56.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.56.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.56.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.57.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.57.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e+00 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.36e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.26e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.96e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e+01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.25e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.57.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.57.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.58.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.58.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.41e+00 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.22e+01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.58.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.58.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.59.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.59.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e+00 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.95e+01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.85e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.30e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.59.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.59.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.59.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.60.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.60.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e+00 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.60e+01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.60.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.60.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.60.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.61.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.61.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.33e+00 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.94e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.82e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.47e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.58e+01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.15e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.61.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.61.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.62.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.62.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e+00 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.87e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e+01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.35e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.43e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.43e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.62.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.62.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.63.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.63.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.41e+00 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.55e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e+00 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.20e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.35e+01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.63.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.63.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.63.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.64.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.64.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e+00 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.90e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.70e+01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.68e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.40e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.64.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.64.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.65.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.65.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.88e+00 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.29e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.98e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.92e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.28e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.72e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e+02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.65.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.65.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.65.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.66.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.66.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.66e+00 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.36e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.46e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.51e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.85e+01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.50e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.66.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.66.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.67.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.67.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.70e+00 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.36e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.74e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.58e+01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.45e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.54e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.41e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.16e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.67.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.67.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.68.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.68.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.41e+00 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e+00 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e+00 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.86e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.67e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.51e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.49e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.80e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.55e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.94e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.75e+01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.48e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.68.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.68.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.68.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.69.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.69.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.56e+00 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.27e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.68e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.42e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.56e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.61e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.85e+01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.59e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.74e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.28e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.18e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.69.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.69.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.69.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.70.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.70.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e+00 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.88e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.65e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.59e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.39e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.98e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.71e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.87e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.33e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e+00 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e+00 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.50e+01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.89e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.57e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.70.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.70.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.70.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.71.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.71.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e+00 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.27e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.86e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e+00 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.50e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.64e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.32e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.91e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.38e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.46e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.45e+01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.18e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.71.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.71.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.72.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.72.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.66e+00 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e+00 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.70e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.83e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.45e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.66e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.62e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.76e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.57e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.77e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e+02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.89e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.25e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.80e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.84e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.72.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.72.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.73.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.73.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e+00 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.31e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.79e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.43e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.39e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.81e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e+02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.64e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.63e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.13e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.85e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.94e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.73.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.73.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wq_b.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wq_b.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wq_b.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wk.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wk.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.wk.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.k_norm.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.k_norm.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.weights_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.weights_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.indexer.weights_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.74.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.74.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.28e+00 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.63e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e+02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.48e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.69e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.98e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.87e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.79e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.87e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.08e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.45e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.74.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.74.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.75.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.75.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.86e+00 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.75e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.28e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.95e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.47e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e+03 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.82e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.03e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.45e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.72e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.59e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.83e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.50e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.42e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.18e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.36e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.47e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.75e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.23e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.75.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.75.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.76.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.76.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.41e+00 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.99e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.70e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.66e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.94e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.62e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.76e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.88e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.86e+02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.42e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.91e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.96e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.71e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.31e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.57e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.97e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.06e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.96e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.74e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.52e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.57e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.77e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.67e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.00e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.03e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.33e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.51e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.91e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.62e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.38e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.86e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.81e-02 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.07e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.76.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.76.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_a_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_a_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_a_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_a_proj_with_mqa.input_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_a_proj_with_mqa.output_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_a_proj_with_mqa.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_b_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_b_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.kv_b_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.o_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.o_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.o_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.q_bmm_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.k_bmm_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.v_bmm_quantizer TensorQuantizer(disabled) model.layers.77.self_attn.p_bmm_quantizer TensorQuantizer(disabled) model.layers.77.mlp.experts.gate_up_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.09e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.05e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.33e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.92e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.63e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.58e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.54e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.78e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.68e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.15e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.56e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.41e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.19e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.85e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.72e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.15e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.56e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.86e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.26e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.48e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.47e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.39e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.42e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.00e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.21e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.80e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.88e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.31e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.40e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.19e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.77e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.90e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.gate_up_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.99e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_input_quantizer TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.42e+03 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.0 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.1 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.17e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.2 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.13e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.3 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.86e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.4 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.5 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.6 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.7 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.30e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.8 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.9 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.10 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.14e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.11 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.02e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.12 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.76e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.13 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.14 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.30e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.15 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.16 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.17 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.60e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.18 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.19 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.32e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.20 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.29e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.21 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.22 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.23 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.34e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.24 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.28e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.25 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.67e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.26 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.27 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.01e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.28 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.85e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.29 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.69e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.30 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.31 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.32 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.33 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.34 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.01e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.35 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.36 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.79e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.37 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.63e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.38 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.39 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.35e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.40 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.41 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.42 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.43 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.44 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.45 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.67e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.46 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.47 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.48 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.49 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.50 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.51 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.52 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.83e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.53 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.54 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.16e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.55 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.56 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.91e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.57 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.22e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.58 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.59 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.47e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.60 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.24e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.61 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.62 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.63 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.64 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.27e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.65 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.66 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.67 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.68 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.69 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.70 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.71 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.72 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.73 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.41e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.74 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.75 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.76 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.77 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.78 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.79 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.80 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.68e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.81 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.82 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.17e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.83 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.84 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.85 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.37e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.86 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.50e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.87 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.96e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.88 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.36e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.89 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.70e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.90 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.15e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.91 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.92 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.76e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.93 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.94 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.95 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.98e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.96 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.97 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.98 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.16e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.99 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.21e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.100 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.20e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.101 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.102 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.103 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.34e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.104 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.54e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.105 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.106 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.16e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.107 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.85e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.108 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.61e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.109 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.05e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.110 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.111 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.112 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.25e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.113 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.86e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.114 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.49e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.115 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.10e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.116 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.98e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.117 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.118 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.119 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.04e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.120 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.54e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.121 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.122 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.34e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.123 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.32e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.124 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.45e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.125 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.25e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.126 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.03e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.127 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.128 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.129 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.97e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.130 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.60e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.131 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.132 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.133 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.53e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.134 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.135 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.01e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.136 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.137 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.02e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.138 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.10e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.139 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.140 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.141 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.61e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.142 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.91e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.143 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.65e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.144 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.07e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.145 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.146 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.18e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.147 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.148 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.149 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.78e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.150 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.38e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.151 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.152 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.153 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.98e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.154 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.34e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.155 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.39e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.156 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.157 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.158 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.05e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.159 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.160 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.77e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.161 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.84e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.162 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.16e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.163 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.62e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.164 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.165 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.01e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.166 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.13e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.167 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.30e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.168 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.169 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.33e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.170 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.171 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.79e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.172 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.173 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.174 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.14e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.175 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.29e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.176 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.51e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.177 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.178 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.179 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.43e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.180 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.181 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.32e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.182 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.183 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.184 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.91e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.185 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.15e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.186 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.41e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.187 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.23e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.188 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.28e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.189 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.00e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.190 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.191 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.82e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.192 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.193 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.18e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.194 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.69e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.195 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.89e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.196 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.197 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.198 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.199 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.85e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.200 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.201 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.66e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.202 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.52e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.203 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.204 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.20e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.205 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.64e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.206 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.11e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.207 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.44e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.208 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.26e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.209 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.210 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.59e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.211 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.07e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.212 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.72e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.213 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.59e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.214 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.22e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.215 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.216 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.08e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.217 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.218 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.12e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.219 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=7.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.220 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.73e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.221 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.65e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.222 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.223 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.95e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.224 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.225 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.58e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.226 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.08e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.227 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.36e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.228 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.79e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.229 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.46e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.230 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=5.35e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.231 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.62e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.232 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.53e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.233 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.234 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.81e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.235 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=6.09e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.236 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.47e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.237 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.71e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.238 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=4.06e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.239 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.38e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.240 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.03e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.241 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.55e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.242 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.23e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.243 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.27e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.244 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.14e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.245 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.40e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.246 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=9.49e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.247 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=8.05e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.248 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.40e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.249 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.02e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.250 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.44e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.251 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.09e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.252 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=3.75e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.253 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.93e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.254 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=2.13e-01 calibrator=MaxCalibrator quant) model.layers.77.mlp.experts.down_proj_weight_quantizers.255 TensorQuantizer((2, 1) bit fake block_sizes={-1: 16, 'type': 'dynamic', 'scale_bits': (4, 3)}, amax=1.09e+00 calibrator=MaxCalibrator quant) model.layers.77.mlp.shared_experts.gate_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.gate_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.gate_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.up_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.up_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.up_proj.weight_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.down_proj.input_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.down_proj.output_quantizer TensorQuantizer(disabled) model.layers.77.mlp.shared_experts.down_proj.weight_quantizer TensorQuantizer(disabled) lm_head.input_quantizer TensorQuantizer(disabled) lm_head.output_quantizer TensorQuantizer(disabled) lm_head.weight_quantizer TensorQuantizer(disabled) 40971 TensorQuantizers found in model